Last updated on Monday, October 06, 2025
@comment{LamkanfiMSR2013: MSR 2013 data-track paper proposing the Eclipse and
Mozilla Defect Tracking Dataset. The annote field holds a publication-category
tag; proper nouns in the title are braced so sentence-casing styles keep them.}
@inproceedings{LamkanfiMSR2013,
  address   = {Piscataway, NJ, USA},
  author    = {Lamkanfi, Ahmed and P{\'e}rez, Javier and
               Demeyer, Serge},
  booktitle = {Proceedings {MSR}'13 (10th {IEEE} Working Conference
               on Mining Software Repositories)},
  note      = {Acceptance ratio (Data Track): 15/27 = 55.6\%},
  pages     = {203--206},
  publisher = {{IEEE} Press},
  series    = {MSR '13},
  title     = {The {Eclipse} and {Mozilla} Defect Tracking Dataset: A
               Genuine Dataset for Mining Bug Information},
  year      = {2013},
  abstract  = {The analysis of bug reports is an important subfield
               within the mining software repositories community. It
               explores the rich data available in defect tracking
               systems to uncover interesting and actionable
               information about the bug triaging process. While bug
               data is readily accessible from systems like Bugzilla
               and JIRA, a common database schema and a curated
               dataset could significantly enhance future research
               because it allows for easier replication.
               Consequently, in this paper we propose the Eclipse
               and Mozilla Defect Tracking Dataset, a representative
               database of bug data, filtered to contain only
               genuine defects (i.e., no feature requests) and
               designed to cover the whole bug-triage life cycle
               (i.e., store all intermediate actions). We have used
               this dataset ourselves for predicting bug severity,
               for studying bug-fixing time and for identifying
               erroneously assigned components. Sharing these data
               with the rest of the community will allow for
               reproducibility, validation and comparison of the
               results obtained in bug-report analyses and
               experiments.},
  annote    = {internationalconference},
  doi       = {10.1109/MSR.2013.6624028},
  isbn      = {978-1-4673-2936-1},
}